#!/usr/bin/env bash

# Train and test STAViS audiovisual models for all splits

# Directory handed to main.py as --root_path by the training runs in this script.
base_path='./experiments'

# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./visual_multi_test1/split1_results \
#     --dataset split${split} \
#     --pool_layer "avgpool" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "pyramid, avgpool, dsam module" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 20 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=2
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./visual_multi_test/split2_results \
#     --dataset split${split} \
#     --pool_layer "avgpool" \
#     --learning_rate 0.01 \
#     --upsample_func "bilinear" \
#     --explain "pyramid, avgpool, dsam module" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 10 --n_epochs 40 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=3
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./visual_multi_test1/split3_results \
#     --dataset split${split} \
#     --pool_layer "avgpool" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "pyramid, avgpool, dsam module" \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 20 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt


# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./visual_multi_test2/split1_results \
#     --dataset split${split} \
#     --pool_layer "avgpool" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "pyramid, avgpool, no_use_dsam_multiScale" \
#     --no_use_dsam_multiScale \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 20 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=2
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./visual_multi_test2/split2_results \
#     --dataset split${split} \
#     --pool_layer "avgpool" \
#     --learning_rate 0.01 \
#     --upsample_func "bilinear" \
#     --explain "pyramid, avgpool, no_use_dsam_multiScale" \
#     --no_use_dsam_multiScale \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 10 --n_epochs 40 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=3
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./visual_multi_test2/split3_results \
#     --dataset split${split} \
#     --pool_layer "avgpool" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "pyramid, avgpool, no_use_dsam_multiScale" \
#     --no_use_dsam_multiScale \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 20 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# Runs with both --no_use_dsam_multiScale and --no_use_dsam_att (results in visual_multi_test3)
# split=1
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./visual_multi_test3/split1_results \
#     --dataset split${split} \
#     --pool_layer "avgpool" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "pyramid, avgpool, no_use_dsam_multiScale, no_use_dsam_att" \
#     --no_use_dsam_multiScale \
#     --no_use_dsam_att \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 20 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=2
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./visual_multi_test3/split2_results \
#     --dataset split${split} \
#     --pool_layer "avgpool" \
#     --learning_rate 0.01 \
#     --upsample_func "bilinear" \
#     --explain "pyramid, avgpool, no_use_dsam_multiScale, no_use_dsam_att" \
#     --no_use_dsam_multiScale \
#     --no_use_dsam_att \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 10 --n_epochs 40 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt

# split=3
# python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12 \
#     --result_path ./visual_multi_test3/split3_results \
#     --dataset split${split} \
#     --pool_layer "avgpool" \
#     --learning_rate 0.01 \
#     --temp_reduction 2 \
#     --upsample_func "bilinear" \
#     --explain "pyramid, avgpool, no_use_dsam_multiScale, no_use_dsam_att" \
#     --no_use_dsam_multiScale \
#     --no_use_dsam_att \
#     --no_use_transposeConv \
#     --no_use_spatio_att \
#     --audiovisual "" --checkpoint 20 --n_epochs 60 \
#     --root_path ${base_path} \
#     --pretrain_path ./data/pretrained_models/resnet-50-kinetics.pth \
#     --audio_pretrain_path ./data/pretrained_models/soundnet8.pth \
#   	--annotation_path_coutrot1_train ./data/fold_lists/Coutrot_db1_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot1_test ./data/fold_lists/Coutrot_db1_list_test_${split}_fps.txt \
#   	--annotation_path_coutrot2_train ./data/fold_lists/Coutrot_db2_list_train_${split}_fps.txt \
#   	--annotation_path_coutrot2_test ./data/fold_lists/Coutrot_db2_list_test_${split}_fps.txt \
#   	--annotation_path_summe_train ./data/fold_lists/SumMe_list_train_${split}_fps.txt \
#   	--annotation_path_summe_test ./data/fold_lists/SumMe_list_test_${split}_fps.txt \
#   	--annotation_path_etmd_train ./data/fold_lists/ETMD_av_list_train_${split}_fps.txt \
#   	--annotation_path_etmd_test ./data/fold_lists/ETMD_av_list_test_${split}_fps.txt \
#   	--annotation_path_avad_train ./data/fold_lists/AVAD_list_train_${split}_fps.txt \
#   	--annotation_path_avad_test ./data/fold_lists/AVAD_list_test_${split}_fps.txt


# python eval_multiprocess.py --base_path /media/Diskd/projects/STAViS_AV \
# --eval_path experiments/visual_multi_test1

# python eval_multiprocess.py --base_path /media/Diskd/projects/STAViS_AV \
# --eval_path experiments/visual_multi_test2

# python eval_multiprocess.py --base_path /media/Diskd/projects/STAViS_AV \
# --eval_path experiments/visual_multi_test3

# ---------------------------------------------------------------------------
# Audiovisual training for splits 1-3 in two variants, followed by evaluation:
#   audiovisual_complete_test1 - run without --use_transformer, learning rate 0.001
#   audiovisual_complete_test  - run with --use_transformer,    learning rate 0.01
# Every run loads its visual weights from the matching
# visual_multi_test1/split<N>_results/save_best_WoFuse.pth checkpoint.
# ---------------------------------------------------------------------------

#######################################
# Launch one audiovisual training run of main.py.
# Globals:
#   base_path (read) - forwarded as --root_path
# Arguments:
#   $1   - split number; selects the dataset name, the result directory,
#          the pretrained visual checkpoint and the fold-list files
#   $2   - experiment directory name used in --result_path
#   $3.. - variant-specific options, placed between --pool_layer and
#          --no_use_transposeConv exactly as given
# Outputs:
#   Prints a warning on stderr when main.py exits with a non-zero status.
# Returns:
#   Exit status of main.py.
#######################################
train_audiovisual() {
    local split=$1
    local experiment=$2
    shift 2

    # The command line is assembled as an array so each option value stays a
    # single word regardless of spaces (the --explain text contains several).
    local -a cmd=(
        python main.py --gpu_devices 0,1 --batch_size 128 --n_threads 12
        --result_path "./${experiment}/split${split}_results"
        --dataset "split${split}"
        --pool_layer "avgpool"
        "$@"
        --no_use_transposeConv
        --no_use_spatio_att
        --audiovisual True --checkpoint 20 --n_epochs 40
        --root_path "${base_path}"
        # NOTE(review): the commented-out visual split-2 run earlier in this
        # file writes to ./visual_multi_test/ (without the "1"); confirm the
        # split-2 checkpoint really exists under visual_multi_test1.
        --pretrain_path "./experiments/visual_multi_test1/split${split}_results/save_best_WoFuse.pth"
        --audio_pretrain_path ./data/pretrained_models/soundnet8.pth
    )

    # One train/test fold list per dataset; "option key:file name prefix".
    local entry key prefix phase
    for entry in coutrot1:Coutrot_db1 coutrot2:Coutrot_db2 summe:SumMe etmd:ETMD_av avad:AVAD; do
        key=${entry%%:*}
        prefix=${entry#*:}
        for phase in train test; do
            cmd+=(
                "--annotation_path_${key}_${phase}"
                "./data/fold_lists/${prefix}_list_${phase}_${split}_fps.txt"
            )
        done
    done

    local status=0
    "${cmd[@]}" || status=$?
    if (( status != 0 )); then
        printf 'warning: main.py exited with status %d (%s, split %s)\n' \
            "${status}" "${experiment}" "${split}" >&2
    fi
    return "${status}"
}

# Variant 1: runs without the transformer options.
for split in 1 2 3; do
    train_audiovisual "${split}" audiovisual_complete_test1 \
        --learning_rate 0.001 \
        --temp_reduction 2 \
        --upsample_func "bilinear" \
        --explain "original audio visual pyramid, avgpool, dsam module"
done

# Variant 2: runs with the transformer options below.
transformer_opts=(
    --use_transformer
    --av_hidden_size 256
    --num_heads 8
    --attn_dropout 0.1
    --lr_transformer 0.001
)

train_audiovisual 1 audiovisual_complete_test \
    --learning_rate 0.01 \
    --temp_reduction 2 \
    --upsample_func "bilinear" \
    --explain "audio visual pyramid, av hidden=256, avgpool, dsam module" \
    "${transformer_opts[@]}"

# NOTE(review): unlike splits 1 and 3, this split-2 run does not pass
# --temp_reduction 2. Kept exactly as it was; confirm whether it is intentional.
train_audiovisual 2 audiovisual_complete_test \
    --learning_rate 0.01 \
    --upsample_func "bilinear" \
    --explain "audio visual pyramid, avgpool, dsam module" \
    "${transformer_opts[@]}"

train_audiovisual 3 audiovisual_complete_test \
    --learning_rate 0.01 \
    --temp_reduction 2 \
    --upsample_func "bilinear" \
    --explain "audio visual pyramid, avgpool, dsam module" \
    "${transformer_opts[@]}"

# Evaluate both experiment directories (transformer variant first, as before).
for experiment in audiovisual_complete_test audiovisual_complete_test1; do
    python eval_multiprocess.py --base_path /media/Diskd/projects/STAViS_AV \
        --eval_path "experiments/${experiment}"
done